build spacy custom ner model stackoverflow

build spacy custom ner model stackoverflow -

def main(model=None, output_dir=r'model', n_iter=100):
    """Train a spaCy entity recognizer on TRAIN_DATA and optionally save it.

    TRAIN_DATA is read as an iterable of ``(text, annotations)`` pairs where
    ``annotations`` is a dict whose ``"entities"`` value is a sequence of
    entity tuples with the label at index 2.

    Args:
        model: Name or path handed to ``spacy.load``. When ``None`` a blank
            ``"en"`` pipeline is created and ``nlp.begin_training()`` is
            called before the first update.
        output_dir: Directory the pipeline is written to with
            ``nlp.to_disk``. Missing directories (including parents) are
            created. Pass ``None`` to skip saving.
        n_iter: Number of passes over TRAIN_DATA.

    Note:
        TRAIN_DATA is shuffled in place at the start of every iteration.
    """
    if model is not None:
        nlp = spacy.load(model)  # load existing spaCy model
        print("Loaded model '%s'" % model)
    else:
        nlp = spacy.blank("en")  # create blank Language class
        print("Created blank 'en' model")

    # Reuse the pipeline's "ner" component when present; otherwise create
    # one and append it so labels can be registered on it below.
    if "ner" in nlp.pipe_names:
        ner = nlp.get_pipe("ner")
    else:
        ner = nlp.create_pipe("ner")
        nlp.add_pipe(ner, last=True)

    # Register every label that occurs in the training annotations.
    # `or ()` tolerates examples whose "entities" key is missing or None.
    for _, annotations in TRAIN_DATA:
        for ent in annotations.get("entities") or ():
            ner.add_label(ent[2])

    # Disable every other pipe so that only NER is updated during training.
    other_pipes = [pipe for pipe in nlp.pipe_names if pipe != "ner"]
    with nlp.disable_pipes(*other_pipes):
        # Only a freshly created model gets begin_training(); a loaded
        # model is updated as-is.
        if model is None:
            nlp.begin_training()
        for itn in range(n_iter):
            random.shuffle(TRAIN_DATA)
            losses = {}
            # batch up the examples using spaCy's minibatch
            batches = minibatch(TRAIN_DATA, size=compounding(4.0, 32.0, 1.001))
            for batch in batches:
                texts, annotations = zip(*batch)
                nlp.update(
                    texts,  # batch of texts
                    annotations,  # batch of annotations
                    drop=0.5,  # dropout - make it harder to memorise data
                    losses=losses,
                )
            print("Losses", losses)

    # Run the trained pipeline over the training texts as a sanity check.
    for text, _ in TRAIN_DATA:
        doc = nlp(text)
        print("Entities", [(ent.text, ent.label_) for ent in doc.ents])
        print("Tokens", [(t.text, t.ent_type_, t.ent_iob) for t in doc])

    # save model to output directory
    if output_dir is not None:
        output_dir = Path(output_dir)
        # parents/exist_ok: works for nested paths and avoids the
        # check-then-create race of exists() followed by mkdir().
        output_dir.mkdir(parents=True, exist_ok=True)
        nlp.to_disk(output_dir)
        print("Saved model to", output_dir)

Comments

Submit

0 Comments

More Questions

how to make a class in python	ModuleNotFoundError: No module named pip._internal	httpie on windows
python read json file	pandas create new column	python write to file
what is the use of class in python	install opencv python	rename columns pandas
rename columns in python	pip upgrade command	how to upgrade pip
command to upgrade the PIP	download pip install	command to update pip
how to upgrade pip in cmd	how to check python version	python iterate dictionary key value
python install pip	windows python pip upgrade	python virtual environment
how to update pip in python	how to read a file in python	how to update pip python
how to replace nan with 0 in pandas	check package version python	streamlit ssl error
networkx remove nodes with degree	get wd in python	find text between two strings regex python
create zero array in python	upgrade python version mc	python get image dimensions
pandas drop empty columns	summation django queryset	oddlyspecific09123890183019283
convert a dictionary into dataframe python	write dataframe to csv python	pygame draw circle
check value vowel user input python	remove commas from string python	No module named sklearn.cross_validation
pandas version check in python	convert column string to int pandas	python italic
python - prime number generator	.annotate unique distinct	current datetime pandas

build spacy custom ner model stackoverflow

build spacy custom ner model stackoverflow -

Comments

0 Comments

More Questions

C

CSS

Objective-C

PHP

Java

C++

Javascript

Html

Python

SQL

Swift

Ruby

Go

R

TypeScript

Kotlin

Assembly

VBA

Scala

Rust

Elixir

Dart

Haskell

Perl

Fortran

Matlab

Scheme

Julia

Lua

Delphi

Pascal

Solidity

BASIC

ActionScript

Csharp